import  pandas as pd
import statsmodels.formula.api as smf
from sqlalchemy import create_engine
import pymysql

db_config = {
    'host': 'localhost',
    'user': 'root',
    'password': 'root',
    'database': 'tushare',
    'port': 3306,
    'charset': 'utf8'
}
engine = create_engine(f"mysql+pymysql://{db_config['user']}:{db_config['password']}@{db_config['host']}:{db_config['port']}/{db_config['database']}?charset={db_config['charset']}")
conn = pymysql.connect(**db_config)
chunk_size = 100000
df=pd.read_sql_query("SELECT * FROM date_1 d WHERE d.the_date BETWEEN '2023-01-01' AND '2023-12-31' AND d.ts_code='000001.SZ'"
                     ,conn
                     ,chunksize=chunk_size
                     )
df1 = pd.concat(df, ignore_index=True)
print(df1.head())

df1['zd_closes'] = round((df1['closes']  - df1['closes'].shift(1)) / df1['closes'].shift(1),2)
print(df1.head())

df1=df1.dropna(subset=['zd_closes'])
print(df1.head())

ex=['id','ts_code','trade_date','the_date','opens','high','low','cloese','pre_closes','changes','pct_chg','vol','amount']
number=df1.select_dtypes(include=['number']).columns.tolist()
newList = [i for i in number if i not in ex]

formula = 'zd_closes ~ ' + ' + '.join(newList)
res = smf.ols(formula, data=df1).fit()
print(res.summary())    
